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, ) 



SEQUENCE LISTING 



[0 



<120> T1R TASTE RECEPTORS AND GENES ENCODING SAME 

<130> 078003-0280681 

<140> 10/035,045 
<141> 2002-01-03 



<150> 60/259,227 

<151> 2001-01-03 

<150> 60/284,547 

<151> 2001-04-19 



<160> 24 



<170> PatentIn Ver. 2.1 



<210> 1 

<211> 876 

<212> DNA 

<213> Homo sapiens 



<400> 1 

agcctggcag tggcctcagg cagagtctga cgcgcacaaa ctttcaggcc caggaagcga 60
ggacaccact ggggccccag ggtgtggcaa gtgaggatgg caagggtttt gctaaacaaa 120
tcctctgccc gctccccgcc ccgggctcac tccatgtgag gccccagtcg gggcagccac 180
ctgccgtgcc tgttggaagt tgcctctgcc atgctgggcc ctgctgtcct gggcctcagc 240
ctctgggctc tcctgcaccc tgggacgggg gccccattgt gcctgtcaca gcaacttagg 300
atgaaggggg actacgtgct gggggggctg ttccccctgg gcgaggccga ggaggctggc 360
ctccgcagcc ggacacggcc cagcagccct gtgtgcacca ggtacagagg tgggacggcc 420
tgggtcgggg tcagggtgac caggtctggg gtgctcctga gctggggccg aggtggccat 480
ctgcggttct gtgtggcccc aggttctcct caaacggcct gctctgggca ctggccatga 540
aaatggccgt ggaggagatc aacaacaagt cggatctgct gcccgggctg cgcctgggct 600
acgacctctt tgatacgtgc tcggagcctg tggtggccat gaagcccagc ctcatgttcc 660
tggccaaggc aggcagccgc gacatcgccg cctactgcaa ctacacgcag taccagcccc 720
gtgtgctggc tgtcatcggg ccccactcgt cagagctcgc catggtcacc ggcaagttct 780
tcagcttctt cctcatgccc cagtggggcg ccccccacca tcacccaccc ccaaccaacc 840
cctgccccgt gggagcccct tgtgtcagga gaatgc 876



<210> 2 

<211> 2687 

<212> DNA 

<213> Homo sapiens 



<400> 2 

tacatgcacc ccacccagcc ctgccctggg agccctgtgt cagaagatgc tcttggcctt 60
gcaggtcagc tacggtgcta gcatggagct gctgagcgcc cgggagacct tcccctcctt 120
cttccgcacc gtgcccagcg accgtgtgca gctgacggcc gccgcggagc tgctgcagga 180
gttcggctgg aactgggtgg ccgccctggg cagcgacgac gagtacggcc ggcagggcct 240
gagcatcttc tcggccctgg ccgcggcacg cggcatctgc atcgcgcacg agggcctggt 300
gccgctgccc cgtgccgatg actcgcggct ggggaaggtg caggacgtcc tgcaccaggt 360
gaaccagagc agcgtgcagg tggtgctgct gttcgcctcc gtgcacgccg cccacgccct 420
cttcaactac agcatcagca gcaggctctc gcccaaggtg tgggtggcca gcgaggcctg 480
gctgacctct gacctggtca tggggctgcc cggcatggcc cagatgggca cggtgcttgg 540
cttcctccag aggggtgccc agctgcacga gttcccccag tacgtgaaga cgcacctggc 600
cctggccacc gacccggcct tctgctctgc cctgggcgag agggagcagg gtctggagga 660
ggacgtggtg ggccagcgct gcccgcagtg tgactgcatc acgctgcaga acgtgagcgc 720
agggctaaat caccaccaga cgttctctgt ctacgcagct gtgtatagcg tggcccaggc 780
cctgcacaac actcttcagt gcaacgcctc aggctgcccc gcgcaggacc ccgtgaagcc 840
ctggcaggtg agcccgggag atgggggtgt gctgtcctct gcatgtgccc aggccaccag 900
gcacggccac cacgcctgag ctggaggtgg ctggcggctc agccccgtcc cccgcccgca 960
gctcctggag aacatgtaca acctgacctt ccacgtgggc gggctgccgc tgcggttcga 1020
cagcagcgga aacgtggaca tggagtacga cctgaagctg tgggtgtggc agggctcagt 1080
gcccaggctc cacgacgtgg gcaggttcaa cggcagcctc aggacagagc gcctgaagat 1140
ccgctggcac acgtctgaca accaggtgag gtgagggtgg gtgtgccagg cgtgcccgtg 1200
gtagcccccg cggcagggcg cagcctgggg gtgggggccg ttccagtctc ccgtgggcat 1260
gcccagccga gcagagccag accccaggcc tgtgcgcaga agcccgtgtc ccggtgctcg 1320
cggcagtgcc aggagggcca ggtgcgccgg gtcaaggggt tccactcctg ctgctacgac 1380
tgtgtggact gcgaggcggg cagctaccgg caaaacccag gtgagccgcc ttcccggcag 1440
gcgggggtgg gaacgcagca ggggagggtc ctgccaagtc ctgactctga gaccagagcc 1500
cacagggtac aagacgaaca cccagcgccc ttctcctctc tcacagacga catcgcctgc 1560
accttttgtg gccaggatga gtggtccccg gagcgaagca cacgctgctt ccgccgcagg 1620
tctcggttcc tggcatgggg cgagccggct gtgctgctgc tgctcctgct gctgagcctg 1680
gcgctgggcc ttgtgctggc tgctttgggg ctgttcgttc accatcggga cagcccactg 1740
gttcaggcct cgggggggcc cctggcctgc tttggcctgg tgtgcctggg cctggtctgc 1800
ctcagcgtcc tcctgttccc tggccagccc agccctgccc gatgcctggc ccagcagccc 1860
ttgtcccacc tcccgctcac gggctgcctg agcacactct tcctgcaggc ggccgagatc 1920
ttcgtggagt cagaactgcc tctgagctgg gcagaccggc tgagtggctg cctgcggggg 1980
ccctgggcct ggctggtggt gctgctggcc atgctggtgg aggtcgcact gtgcacctgg 2040
tacctggtgg ccttcccgcc ggaggtggtg acggactggc acatgctgcc cacggaggcg 2100
ctggtgcact gccgcacacg ctcctgggtc agcttcggcc tagcgcacgc caccaatgcc 2160
acgctggcct ttctctgctt cctgggcact ttcctggtgc ggagccagcc gggctgctac 2220
aaccgtgccc gtggcctcac ctttgccatg ctggcctact tcatcacctg ggtctccttt 2280
gtgcccctcc tggccaatgt gcaggtggtc ctcaggcccg ccgtgcagat gggcgccctc 2340
ctgctctgtg tcctgggcat cctggctgcc ttccacctgc ccaggtgtta cctgctcatg 2400
cggcagccag ggctcaacac ccccgagttc ttcctgggag ggggccctgg ggatgcccaa 2460
ggccagaatg acgggaacac aggaaatcag gggaaacatg agtgacccaa ccctgtgatc 2520
tcagccccgg tgaacccaga cttagctgcg atccccccca agccagcaat gacccgtgtc 2580
tcgctacaga gaccctcccg ctctaggttc tgaccccagg ttgtctcctg accctgaccc 2640
cacagtgagc cctaggcctg gagcacgtgg acacccctgt gaccatc 2687



<210> 3 

<211> 2559 

<212> DNA 

<213> Homo sapiens 

<400> 3 

atgctgggcc ctgctgtcct gggcctcagc ctctgggctc tcctgcaccc tgggacgggg 60 
gccccattgt gcctgtcaca gcaacttagg atgaaggggg actacgtgct gggggggctg 120 
ttccccctgg gcgaggccga ggaggctggc ctccgcagcc ggacacggcc cagcagccct 180 
gtgtgcacca ggttctcctc aaacggcctg ctctgggcac tggccatgaa aatggccgtg 240 
gaggagatca acaacaagtc ggatctgctg cccgggctgc gcctgggcta cgacctcttt 300 
gatacgtgct cggagcctgt ggtggccatg aagcccagcc tcatgttcct ggccaaggca 360 
ggcagccgcg acatcgccgc ctactgcaac tacacgcagt accagccccg tgtgctggct 420 
gtcatcgggc cccactcgtc agagctcgcc atggtcaccg gcaagttctt cagcttcttc 480 
ctcatgcccc aggtcagcta cggtgctagc atggagctgc tgagcgcccg ggagaccttc 540
ccctccttct tccgcaccgt gcccagcgac cgtgtgcagc tgacggccgc cgcggagctg 600
ctgcaggagt tcggctggaa ctgggtggcc gccctgggca gcgacgacga gtacggccgg 660
cagggcctga gcatcttctc ggccctggcc gcggcacgcg gcatctgcat cgcgcacgag 720
ggcctggtgc cgctgccccg tgccgatgac tcgcggctgg ggaaggtgca ggacgtcctg 780
caccaggtga accagagcag cgtgcaggtg gtgctgctgt tcgcctccgt gcacgccgcc 840
cacgccctct tcaactacag catcagcagc aggctctcgc ccaaggtgtg ggtggccagc 900
gaggcctggc tgacctctga cctggtcatg gggctgcccg gcatggccca gatgggcacg 960
gtgcttggct tcctccagag gggtgcccag ctgcacgagt tcccccagta cgtgaagacg 1020
cacctggccc tggccaccga cccggccttc tgctctgccc tgggcgagag ggagcagggt 1080
ctggaggagg acgtggtggg ccagcgctgc ccgcagtgtg actgcatcac gctgcagaac 1140
gtgagcgcag ggctaaatca ccaccagacg ttctctgtct acgcagctgt gtatagcgtg 1200
gcccaggccc tgcacaacac tcttcagtgc aacgcctcag gctgccccgc gcaggacccc 1260
gtgaagccct ggcagctcct ggagaacatg tacaacctga ccttccacgt gggcgggctg 1320
ccgctgcggt tcgacagcag cggaaacgtg gacatggagt acgacctgaa gctgtgggtg 1380
tggcagggct cagtgcccag gctccacgac gtgggcaggt tcaacggcag cctcaggaca 1440
gagcgcctga agatccgctg gcacacgtct gacaaccaga agcccgtgtc ccggtgctcg 1500
cggcagtgcc aggagggcca ggtgcgccgg gtcaaggggt tccactcctg ctgctacgac 1560
tgtgtggact gcgaggcggg cagctaccgg caaaacccag acgacatcgc ctgcaccttt 1620
tgtggccagg atgagtggtc cccggagcga agcacacgct gcttccgccg caggtctcgg 1680
ttcctggcat ggggcgagcc ggctgtgctg ctgctgctcc tgctgctgag cctggcgctg 1740
ggccttgtgc tggctgcttt ggggctgttc gttcaccatc gggacagccc actggttcag 1800
gcctcggggg ggcccctggc ctgctttggc ctggtgtgcc tgggcctggt ctgcctcagc 1860
gtcctcctgt tccctggcca gcccagccct gcccgatgcc tggcccagca gcccttgtcc 1920
cacctcccgc tcacgggctg cctgagcaca ctcttcctgc aggcggccga gatcttcgtg 1980
gagtcagaac tgcctctgag ctgggcagac cggctgagtg gctgcctgcg ggggccctgg 2040
gcctggctgg tggtgctgct ggccatgctg gtggaggtcg cactgtgcac ctggtacctg 2100
gtggccttcc cgccggaggt ggtgacggac tggcacatgc tgcccacgga ggcgctggtg 2160
cactgccgca cacgctcctg ggtcagcttc ggcctagcgc acgccaccaa tgccacgctg 2220
gcctttctct gcttcctggg cactttcctg gtgcggagcc agccgggctg ctacaaccgt 2280
gcccgtggcc tcacctttgc catgctggcc tacttcatca cctgggtctc ctttgtgccc 2340
ctcctggcca atgtgcaggt ggtcctcagg cccgccgtgc agatgggcgc cctcctgctc 2400
tgtgtcctgg gcatcctggc tgccttccac ctgcccaggt gttacctgct catgcggcag 2460
ccagggctca acacccccga gttcttcctg ggagggggcc ctggggatgc ccaaggccag 2520
aatgacggga acacaggaaa tcaggggaaa catgagtga 2559



<210> 4 
<211> 852 
<212> PRT 

<213> Homo sapiens 



<400> 4 

Met Leu Gly Pro Ala Val Leu Gly Leu Ser Leu Trp Ala Leu Leu His
1 5 10 15

Pro Gly Thr Gly Ala Pro Leu Cys Leu Ser Gln Gln Leu Arg Met Lys
20 25 30

Gly Asp Tyr Val Leu Gly Gly Leu Phe Pro Leu Gly Glu Ala Glu Glu
35 40 45

Ala Gly Leu Arg Ser Arg Thr Arg Pro Ser Ser Pro Val Cys Thr Arg
50 55 60

Phe Ser Ser Asn Gly Leu Leu Trp Ala Leu Ala Met Lys Met Ala Val
65 70 75 80



Glu Glu Ile Asn Asn Lys Ser Asp Leu Leu Pro Gly Leu Arg Leu Gly
85 90 95

Tyr Asp Leu Phe Asp Thr Cys Ser Glu Pro Val Val Ala Met Lys Pro
100 105 110

Ser Leu Met Phe Leu Ala Lys Ala Gly Ser Arg Asp Ile Ala Ala Tyr
115 120 125

Cys Asn Tyr Thr Gln Tyr Gln Pro Arg Val Leu Ala Val Ile Gly Pro
130 135 140

His Ser Ser Glu Leu Ala Met Val Thr Gly Lys Phe Phe Ser Phe Phe
145 150 155 160

Leu Met Pro Gln Val Ser Tyr Gly Ala Ser Met Glu Leu Leu Ser Ala
165 170 175

Arg Glu Thr Phe Pro Ser Phe Phe Arg Thr Val Pro Ser Asp Arg Val
180 185 190

Gln Leu Thr Ala Ala Ala Glu Leu Leu Gln Glu Phe Gly Trp Asn Trp
195 200 205

Val Ala Ala Leu Gly Ser Asp Asp Glu Tyr Gly Arg Gln Gly Leu Ser
210 215 220

Ile Phe Ser Ala Leu Ala Ala Ala Arg Gly Ile Cys Ile Ala His Glu
225 230 235 240

Gly Leu Val Pro Leu Pro Arg Ala Asp Asp Ser Arg Leu Gly Lys Val
245 250 255

Gln Asp Val Leu His Gln Val Asn Gln Ser Ser Val Gln Val Val Leu
260 265 270

Leu Phe Ala Ser Val His Ala Ala His Ala Leu Phe Asn Tyr Ser Ile
275 280 285

Ser Ser Arg Leu Ser Pro Lys Val Trp Val Ala Ser Glu Ala Trp Leu
290 295 300

Thr Ser Asp Leu Val Met Gly Leu Pro Gly Met Ala Gln Met Gly Thr
305 310 315 320

Val Leu Gly Phe Leu Gln Arg Gly Ala Gln Leu His Glu Phe Pro Gln
325 330 335

Tyr Val Lys Thr His Leu Ala Leu Ala Thr Asp Pro Ala Phe Cys Ser
340 345 350

Ala Leu Gly Glu Arg Glu Gln Gly Leu Glu Glu Asp Val Val Gly Gln
355 360 365

Arg Cys Pro Gln Cys Asp Cys Ile Thr Leu Gln Asn Val Ser Ala Gly
370 375 380

Leu Asn His His Gln Thr Phe Ser Val Tyr Ala Ala Val Tyr Ser Val
385 390 395 400

Ala Gln Ala Leu His Asn Thr Leu Gln Cys Asn Ala Ser Gly Cys Pro
405 410 415

Ala Gln Asp Pro Val Lys Pro Trp Gln Leu Leu Glu Asn Met Tyr Asn
420 425 430

Leu Thr Phe His Val Gly Gly Leu Pro Leu Arg Phe Asp Ser Ser Gly
435 440 445

Asn Val Asp Met Glu Tyr Asp Leu Lys Leu Trp Val Trp Gln Gly Ser
450 455 460

Val Pro Arg Leu His Asp Val Gly Arg Phe Asn Gly Ser Leu Arg Thr
465 470 475 480

Glu Arg Leu Lys Ile Arg Trp His Thr Ser Asp Asn Gln Lys Pro Val
485 490 495

Ser Arg Cys Ser Arg Gln Cys Gln Glu Gly Gln Val Arg Arg Val Lys
500 505 510

Gly Phe His Ser Cys Cys Tyr Asp Cys Val Asp Cys Glu Ala Gly Ser
515 520 525

Tyr Arg Gln Asn Pro Asp Asp Ile Ala Cys Thr Phe Cys Gly Gln Asp
530 535 540

Glu Trp Ser Pro Glu Arg Ser Thr Arg Cys Phe Arg Arg Arg Ser Arg
545 550 555 560

Phe Leu Ala Trp Gly Glu Pro Ala Val Leu Leu Leu Leu Leu Leu Leu
565 570 575

Ser Leu Ala Leu Gly Leu Val Leu Ala Ala Leu Gly Leu Phe Val His
580 585 590

His Arg Asp Ser Pro Leu Val Gln Ala Ser Gly Gly Pro Leu Ala Cys
595 600 605

Phe Gly Leu Val Cys Leu Gly Leu Val Cys Leu Ser Val Leu Leu Phe
610 615 620

Pro Gly Gln Pro Ser Pro Ala Arg Cys Leu Ala Gln Gln Pro Leu Ser
625 630 635 640

His Leu Pro Leu Thr Gly Cys Leu Ser Thr Leu Phe Leu Gln Ala Ala
645 650 655

Glu Ile Phe Val Glu Ser Glu Leu Pro Leu Ser Trp Ala Asp Arg Leu
660 665 670

Ser Gly Cys Leu Arg Gly Pro Trp Ala Trp Leu Val Val Leu Leu Ala
675 680 685

Met Leu Val Glu Val Ala Leu Cys Thr Trp Tyr Leu Val Ala Phe Pro
690 695 700

Pro Glu Val Val Thr Asp Trp His Met Leu Pro Thr Glu Ala Leu Val
705 710 715 720

His Cys Arg Thr Arg Ser Trp Val Ser Phe Gly Leu Ala His Ala Thr
725 730 735

Asn Ala Thr Leu Ala Phe Leu Cys Phe Leu Gly Thr Phe Leu Val Arg
740 745 750

Ser Gln Pro Gly Cys Tyr Asn Arg Ala Arg Gly Leu Thr Phe Ala Met
755 760 765

Leu Ala Tyr Phe Ile Thr Trp Val Ser Phe Val Pro Leu Leu Ala Asn
770 775 780

Val Gln Val Val Leu Arg Pro Ala Val Gln Met Gly Ala Leu Leu Leu
785 790 795 800

Cys Val Leu Gly Ile Leu Ala Ala Phe His Leu Pro Arg Cys Tyr Leu
805 810 815

Leu Met Arg Gln Pro Gly Leu Asn Thr Pro Glu Phe Phe Leu Gly Gly
820 825 830

Gly Pro Gly Asp Ala Gln Gly Gln Asn Asp Gly Asn Thr Gly Asn Gln
835 840 845

Gly Lys His Glu
850



<210> 5 
<211> 23 
<212> DNA 

<213> Artificial Sequence 
<220>
<223> Description of Artificial Sequence: Primer

<220>
<221> modified_base
<222> (3)
<223> a, t, c, g, other or unknown

<220>
<221> modified_base
<222> (9)
<223> a, t, c, g, other or unknown

<220>
<221> modified_base
<222> (12)
<223> a, t, c, g, other or unknown

<220>
<221> modified_base
<222> (18)
<223> a, t, c, g, other or unknown

<400> 5

cgnttyytng cntggggnga rcc 23 



<210> 6 
<211> 23 
<212> DNA 

<213> Artificial Sequence 



<220>
<223> Description of Artificial Sequence: Primer

<220>
<221> modified_base
<222> (3)
<223> a, t, c, g, other or unknown

<220>
<221> modified_base
<222> (6)
<223> a, t, c, g, other or unknown

<220>
<221> modified_base
<222> (18)
<223> a, t, c, g, other or unknown

<220>
<221> modified_base
<222> (21)
<223> a, t, c, g, other or unknown

<400> 6

cgngcncgrt trtarcancc ngg 23 



<210> 7 

<211> 9 

<212> PRT 

<213> Homo sapiens 

<400> 7

Arg Phe Leu Ala Trp Gly Glu Pro Ala 
1 5 



<210> 8 

<211> 8 

<212> PRT 

<213> Homo sapiens 



8 

<400> 8 

Pro Gly Cys Tyr Asn Arg Ala Arg 
1 5 



<210> 9 
<211> 552 
<212> DNA 
<213> Mus sp. 



<400> 9 

gtgctgtcac tcctcctgct gctttgcctg gtgctgggtc tagcactggc tgctctgggg 60
ctctctgtcc accactggga cagccctctt gtccaggcct caggcggctc acagttctgc 120
tttggcctga tctgcctagg cctcttctgc ctcagtgtcc ttctgttccc aggacggcca 180
agctctgcca gctgccttgc acaacaacca atggctcacc tccctctcac aggctgcctg 240
agcacactct tcctgcaagc agctgagacc tttgtggagt ctgagctgcc actgagctgg 300
gcaaactggc tatgcagcta ccttcgggac tctggcctgc tagtggtact gttggccact 360
tttgtggagg cagcactatg tgcctggtat ttgaccgctt caccagaagt ggtgacagac 420
tggtcagtgc tgcccacaga ggtactggag cactgccacg tgcgttcctg ggtcaacctg 480
ggcttggtgc acatcaccaa tgcaatggta gcttttctct gctttctggg cactttcctg 540
gtacaagacc ag 552



<210> 10 
<211> 184 
<212> PRT 
<213> Mus sp.



<400> 10 
Val Leu Ser Leu Leu Leu Leu Leu Cys Leu Val Leu Gly Leu Ala Leu
1 5 10 15

Ala Ala Leu Gly Leu Ser Val His His Trp Asp Ser Pro Leu Val Gln
20 25 30

Ala Ser Gly Gly Ser Gln Phe Cys Phe Gly Leu Ile Cys Leu Gly Leu
35 40 45

Phe Cys Leu Ser Val Leu Leu Phe Pro Gly Arg Pro Ser Ser Ala Ser
50 55 60

Cys Leu Ala Gln Gln Pro Met Ala His Leu Pro Leu Thr Gly Cys Leu
65 70 75 80

Ser Thr Leu Phe Leu Gln Ala Ala Glu Thr Phe Val Glu Ser Glu Leu
85 90 95

Pro Leu Ser Trp Ala Asn Trp Leu Cys Ser Tyr Leu Arg Asp Ser Gly
100 105 110

Leu Leu Val Val Leu Leu Ala Thr Phe Val Glu Ala Ala Leu Cys Ala
115 120 125

Trp Tyr Leu Thr Ala Ser Pro Glu Val Val Thr Asp Trp Ser Val Leu
130 135 140

Pro Thr Glu Val Leu Glu His Cys His Val Arg Ser Trp Val Asn Leu
145 150 155 160

Gly Leu Val His Ile Thr Asn Ala Met Val Ala Phe Leu Cys Phe Leu
165 170 175

Gly Thr Phe Leu Val Gln Asp Gln
180



<210> 11 
<211> 558 
<212> DNA 
<213> Rattus sp.

<400> 11 

gtgctgtcac ttctcctgct gctttgcctg gtgctgggcc tgacactggc tgccctgggg 60 

ctctttgtcc actactggga cagccctctt gttcaggcct caggtgggtc actgttctgc 120 

tttggcctga tctgcctagg cctcttctgc ctcagtgtcc ttctgttccc aggacgacca 180 

cgctctgcca gctgccttgc ccaacaacca atggctcacc tccctctcac aggctgcctg 240 

agcacactct tcctgcaagc agccgagatc tttgtggagt ctgagctgcc actgagttgg 300

gcaaactggc tctgcagcta ccttcggggc ccctgggctt ggctggtggt actgctggcc 360 

actcttgtgg aggctgcact atgtgcctgg tacttgatgg ctttccctcc agaggtggtg 420 

acagattggc aggtgctgcc cacggaggta ctggaacact gccgcatgcg ttcctgggtc 480 

agcctgggct tggtgcacat caccaatgca ggggtagctt tcctctgctt tctgggcact 540 
ttcctggtac aaagccag 558 



<210> 12 

<211> 186 

<212> PRT 

<213> Rattus sp.

<400> 12 
Val Leu Ser Leu Leu Leu Leu Leu Cys Leu Val Leu Gly Leu Thr Leu
1 5 10 15

Ala Ala Leu Gly Leu Phe Val His Tyr Trp Asp Ser Pro Leu Val Gln
20 25 30

Ala Ser Gly Gly Ser Leu Phe Cys Phe Gly Leu Ile Cys Leu Gly Leu
35 40 45

Phe Cys Leu Ser Val Leu Leu Phe Pro Gly Arg Pro Arg Ser Ala Ser
50 55 60

Cys Leu Ala Gln Gln Pro Met Ala His Leu Pro Leu Thr Gly Cys Leu
65 70 75 80

Ser Thr Leu Phe Leu Gln Ala Ala Glu Ile Phe Val Glu Ser Glu Leu
85 90 95

Pro Leu Ser Trp Ala Asn Trp Leu Cys Ser Tyr Leu Arg Gly Pro Trp
100 105 110

Ala Trp Leu Val Val Leu Leu Ala Thr Leu Val Glu Ala Ala Leu Cys
115 120 125

Ala Trp Tyr Leu Met Ala Phe Pro Pro Glu Val Val Thr Asp Trp Gln
130 135 140

Val Leu Pro Thr Glu Val Leu Glu His Cys Arg Met Arg Ser Trp Val
145 150 155 160

Ser Leu Gly Leu Val His Ile Thr Asn Ala Gly Val Ala Phe Leu Cys
165 170 175

Phe Leu Gly Thr Phe Leu Val Gln Ser Gln
180 185



<210> 13 

<211> 2577

<212> DNA 

<213> Rattus sp. 

<400> 13 

atgccgggtt tggctatctt gggcctcagt ctggctgctt tcctggagct tgggatgggg 60
tcctctttgt gtctgtcaca gcaattcaag gcacaagggg actatatatt gggtggacta 120
tttcccctgg gcacaactga ggaggccact ctcaaccaga gaacacagcc caacggcatc 180
ctatgtacca ggttctcgcc ccttggtttg ttcctggcca tggctatgaa gatggctgta 240
gaggagatca acaatggatc tgccttgctc cctgggctgc gactgggcta tgacctgttt 300
gacacatgct cagagccagt ggtcaccatg aagcccagcc tcatgttcat ggccaaggtg 360
ggaagtcaaa gcattgctgc ctactgcaac tacacacagt accaaccccg tgtgctggct 420
gtcattggtc cccactcatc agagcttgcc ctcattacag gcaagttctt cagcttcttc 480
ctcatgccac aggtcagcta tagtgccagc atggatcggc taagtgaccg ggaaacattt 540
ccatccttct tccgcacagt gcccagtgac cgggtgcagc tgcaggccgt tgtgacactg 600
ttgcagaatt tcagctggaa ctgggtggct gccttaggta gtgatgatga ctatggccgg 660
gaaggtctga gcatcttttc tggtctggcc aactcacgag gtatctgcat tgcacacgag 720
ggcctggtgc cacaacatga cactagtggc caacaattgg gcaaggtggt ggatgtgcta 780
cgccaagtga accaaagcaa agtacaggtg gtggtgctgt ttgcatctgc ccgtgctgtc 840
tactcccttt ttagctacag catccttcat gacctctcac ccaaggtatg ggtggccagt 900
gagtcctggc tgacctctga cctggtcatg acacttccca atattgcccg tgtgggcact 960
gttcttgggt ttctgcagcg cggtgcccta ctgcctgaat tttcccatta tgtggagact 1020
cgccttgccc tagctgctga cccaacattc tgtgcctccc tgaaagctga gttggatctg 1080
gaggagcgcg tgatggggcc acgctgttca caatgtgact acatcatgct acagaacctg 1140
tcatctgggc tgatgcagaa cctatcagct gggcagttgc accaccaaat atttgcaacc 1200
tatgcagctg tgtacagtgt ggctcaggcc cttcacaaca ccctgcagtg caatgtctca 1260
cattgccaca catcagagcc tgttcaaccc tggcagctcc tggagaacat gtacaatatg 1320
agtttccgtg ctcgagactt gacactgcag tttgatgcca aagggagtgt agacatggaa 1380
tatgacctga agatgtgggt gtggcagagc cctacacctg tactacatac tgtaggcacc 1440
ttcaacggca cccttcagct gcagcactcg aaaatgtatt ggccaggcaa ccaggtgcca 1500
gtctcccagt gctcccggca gtgcaaagat ggccaggtgc gcagagtaaa gggctttcat 1560
tcctgctgct atgactgtgt ggactgcaag gcagggagct accggaagca tccagatgac 1620
ttcacctgta ctccatgtgg caaggatcag tggtccccag aaaaaagcac aacctgctta 1680
cctcgcaggc ccaagtttct ggcttggggg gagccagctg tgctgtcact tctcctgctg 1740
ctttgcctgg tgctgggcct gacactggct gccctggggc tctttgtcca ctactgggac 1800
agccctcttg ttcaggcctc aggtgggtca ctgttctgct ttggcctgat ctgcctaggc 1860
ctcttctgcc tcagtgtcct tctgttccca ggacgaccac gctctgccag ctgccttgcc 1920
caacaaccaa tggctcacct ccctctcaca ggctgcctga gcacactctt cctgcaagca 1980
gccgagatct ttgtggagtc tgagctgcca ctgagttggg caaactggct ctgcagctac 2040
cttcggggcc cctgggcttg gctggtggta ctgctggcca ctcttgtgga ggctgcacta 2100
tgtgcctggt acttgatggc tttccctcca gaggtggtga cagattggca ggtgctgccc 2160
acggaggtac tggaacactg ccgcatgcgt tcctgggtca gcctgggctt ggtgcacatc 2220
accaatgcag tgttagcttt cctctgcttt ctgggcactt tcctggtaca gagccagcct 2280
ggtcgctata accgtgcccg tggcctcacc ttcgccatgc tagcttattt catcatctgg 2340
gtctcttttg tgcccctcct ggctaatgtg caggtggcct accagccagc tgtgcagatg 2400
ggtgctatct tattctgtgc cctgggcatc ctggccacct tccacctgcc caaatgctat 2460
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gtacttctgt ggctgccaga gctcaacacc caggagttct tcctgggaag gagccccaag 2520 
gaagcatcag atgggaatag tggtagtagt gaggcaactc ggggacacag tgaatga 2577

<210> 14 
<211> 858 
<212> PRT 
<213> Rattus sp. 

<400> 14 

Met Pro Gly Leu Ala Ile Leu Gly Leu Ser Leu Ala Ala Phe Leu Glu
1 5 10 15

Leu Gly Met Gly Ser Ser Leu Cys Leu Ser Gln Gln Phe Lys Ala Gln
20 25 30

Gly Asp Tyr Ile Leu Gly Gly Leu Phe Pro Leu Gly Thr Thr Glu Glu
35 40 45

Ala Thr Leu Asn Gln Arg Thr Gln Pro Asn Gly Ile Leu Cys Thr Arg
50 55 60

Phe Ser Pro Leu Gly Leu Phe Leu Ala Met Ala Met Lys Met Ala Val
65 70 75 80

Glu Glu Ile Asn Asn Gly Ser Ala Leu Leu Pro Gly Leu Arg Leu Gly
85 90 95

Tyr Asp Leu Phe Asp Thr Cys Ser Glu Pro Val Val Thr Met Lys Pro
100 105 110

Ser Leu Met Phe Met Ala Lys Val Gly Ser Gln Ser Ile Ala Ala Tyr
115 120 125

Cys Asn Tyr Thr Gln Tyr Gln Pro Arg Val Leu Ala Val Ile Gly Pro
130 135 140

His Ser Ser Glu Leu Ala Leu Ile Thr Gly Lys Phe Phe Ser Phe Phe
145 150 155 160

Leu Met Pro Gln Val Ser Tyr Ser Ala Ser Met Asp Arg Leu Ser Asp
165 170 175

Arg Glu Thr Phe Pro Ser Phe Phe Arg Thr Val Pro Ser Asp Arg Val
180 185 190

Gln Leu Gln Ala Val Val Thr Leu Leu Gln Asn Phe Ser Trp Asn Trp
195 200 205

Val Ala Ala Leu Gly Ser Asp Asp Asp Tyr Gly Arg Glu Gly Leu Ser
210 215 220

Ile Phe Ser Gly Leu Ala Asn Ser Arg Gly Ile Cys Ile Ala His Glu
225 230 235 240

Gly Leu Val Pro Gln His Asp Thr Ser Gly Gln Gln Leu Gly Lys Val
245 250 255



') 
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Val Asp Val Leu Arg Gin Val Asn Gin Ser Lys Val Gin Val Val Val 
260 265 270 

Leu Phe Ala Ser Ala Arg Ala Val Tyr Ser Leu Phe Ser Tyr Ser Ile
275 280 285

Leu His Asp Leu Ser Pro Lys Val Trp Val Ala Ser Glu Ser Trp Leu
290 295 300

Thr Ser Asp Leu Val Met Thr Leu Pro Asn Ile Ala Arg Val Gly Thr
305 310 315 320

Val Leu Gly Phe Leu Gln Arg Gly Ala Leu Leu Pro Glu Phe Ser His
325 330 335

Tyr Val Glu Thr Arg Leu Ala Leu Ala Ala Asp Pro Thr Phe Cys Ala
340 345 350

Ser Leu Lys Ala Glu Leu Asp Leu Glu Glu Arg Val Met Gly Pro Arg
355 360 365

Cys Ser Gln Cys Asp Tyr Ile Met Leu Gln Asn Leu Ser Ser Gly Leu
370 375 380

Met Gln Asn Leu Ser Ala Gly Gln Leu His His Gln Ile Phe Ala Thr
385 390 395 400

Tyr Ala Ala Val Tyr Ser Val Ala Gln Ala Leu His Asn Thr Leu Gln
405 410 415

Cys Asn Val Ser His Cys His Thr Ser Glu Pro Val Gln Pro Trp Gln
420 425 430

Leu Leu Glu Asn Met Tyr Asn Met Ser Phe Arg Ala Arg Asp Leu Thr
435 440 445

Leu Gln Phe Asp Ala Lys Gly Ser Val Asp Met Glu Tyr Asp Leu Lys
450 455 460

Met Trp Val Trp Gln Ser Pro Thr Pro Val Leu His Thr Val Gly Thr
465 470 475 480

Phe Asn Gly Thr Leu Gln Leu Gln His Ser Lys Met Tyr Trp Pro Gly
485 490 495

Asn Gln Val Pro Val Ser Gln Cys Ser Arg Gln Cys Lys Asp Gly Gln
500 505 510

Val Arg Arg Val Lys Gly Phe His Ser Cys Cys Tyr Asp Cys Val Asp
515 520 525

Cys Lys Ala Gly Ser Tyr Arg Lys His Pro Asp Asp Phe Thr Cys Thr
530 535 540

Pro Cys Gly Lys Asp Gln Trp Ser Pro Glu Lys Ser Thr Thr Cys Leu
545 550 555 560



, ) . ) 
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Pro Arg Arg Pro Lys Phe Leu Ala Trp Gly Glu Pro Ala Val Leu Ser 
565 570 575 

Leu Leu Leu Leu Leu Cys Leu Val Leu Gly Leu Thr Leu Ala Ala Leu
580 585 590

Gly Leu Phe Val His Tyr Trp Asp Ser Pro Leu Val Gln Ala Ser Gly
595 600 605

Gly Ser Leu Phe Cys Phe Gly Leu Ile Cys Leu Gly Leu Phe Cys Leu
610 615 620

Ser Val Leu Leu Phe Pro Gly Arg Pro Arg Ser Ala Ser Cys Leu Ala
625 630 635 640

Gln Gln Pro Met Ala His Leu Pro Leu Thr Gly Cys Leu Ser Thr Leu
645 650 655

Phe Leu Gln Ala Ala Glu Ile Phe Val Glu Ser Glu Leu Pro Leu Ser
660 665 670

Trp Ala Asn Trp Leu Cys Ser Tyr Leu Arg Gly Pro Trp Ala Trp Leu
675 680 685

Val Val Leu Leu Ala Thr Leu Val Glu Ala Ala Leu Cys Ala Trp Tyr
690 695 700

Leu Met Ala Phe Pro Pro Glu Val Val Thr Asp Trp Gln Val Leu Pro
705 710 715 720

Thr Glu Val Leu Glu His Cys Arg Met Arg Ser Trp Val Ser Leu Gly
725 730 735

Leu Val His Ile Thr Asn Ala Val Leu Ala Phe Leu Cys Phe Leu Gly
740 745 750

Thr Phe Leu Val Gln Ser Gln Pro Gly Arg Tyr Asn Arg Ala Arg Gly
755 760 765

Leu Thr Phe Ala Met Leu Ala Tyr Phe Ile Ile Trp Val Ser Phe Val
770 775 780

Pro Leu Leu Ala Asn Val Gln Val Ala Tyr Gln Pro Ala Val Gln Met
785 790 795 800

Gly Ala Ile Leu Phe Cys Ala Leu Gly Ile Leu Ala Thr Phe His Leu
805 810 815

Pro Lys Cys Tyr Val Leu Leu Trp Leu Pro Glu Leu Asn Thr Gln Glu
820 825 830

Phe Phe Leu Gly Arg Ser Pro Lys Glu Ala Ser Asp Gly Asn Ser Gly
835 840 845

Ser Ser Glu Ala Thr Arg Gly His Ser Glu
850 855



) 
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<210> 15 
<211> 8194 
<212> DNA 

<213> Homo sapiens 
<220>
<221> modified_base
<222> (1251)..(1300)
<223> a, t, c, g, other or unknown

<220>
<221> modified_base
<222> (1951)..(2000)
<223> a, t, c, g, other or unknown

<400> 15 

gagaatctcg cgagatcccg tcggtccgcc ccgctgccct cccagctgcc gaaaagaggg 60 
gcctccgagc cgccggcgcc ctctgccggc aacctccgga agcacactag gaggttccag 120 
ccgatctggt cgaggggctc cacggaggac tccatttacg ttacgcaaat tccctacccc 180 
agccggccgg agagagaaag ccagaaacct cgcgaccagc catgggccac ctctccggaa 240 
aaacaccggg atattttttt tctcctgcag aaaaagcttt aggattggca gtttaaacaa 300 
aacatgtcta tttgcatacc ttcggtttgc atgcatttgt ttcgaagtga gcaaccctgg 360 
gtaacaaggc gaaagtatat gacaatttgc tcagaatctt aatgtcagaa aactggagac 420 
tggggcaggg gggtgtcgac tcaaagctgt gtctcattta gtaaactgag gcccaggtaa 480 
aaagttctga aacctcgcaa cacccggaga aattgtgttc cagcctccca cctcgcccca 540 
aaatgccaga gctccttttc taagccaggt gaagtcacag agcgtggaca gaacccacaa 600 
ccgtccagag gaagggtcac tgggtgccac ctggtttgca tctgtgcctt cgtcctgccc 660 
agttcctgag tgggaccgca ggcccggaat gtcaaggcaa acagtcctgc ttcagccact 720 
gggctccagt cccacccctt ttgggggcct gaagttagga agcatccggc agctgccttc 780 
tatttaagca actggcctcc ttagaggcca ctccttggcc atgccaggcg cgggcatctg 840 
gccagcatgc tgctctgcac ggctcgcctg gtcggcctgc agcttctcat ttcctgctgc 900 
tgggcctttg cctgccatag cacggagtct tctcctgact tcaccctccc cggagattac 960 
ctcctggcag gcctgttccc tctccattct ggctgtctgc aggtgaggca cagacccgag 1020 
gtgaccctgt gtgacaggtg agtgaggggc cagcagagcc acacttagtg ggacccctgg 1080 
ctatagggcc cctctggctg ccatcctcca aacaggacct tgcctctgcc tttgcccctt 1140 
gaactgtccc caggccttgt tcatcaatcc acttgccacc taagtgctgg ctagaccttc 1200 
ctagacactt cggccagttt ccaattattt cacccttgct gttagaatgt nnnnnnnnnn 1260 
nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn aattccttaa actaaatttc 1320 
tcactttctc tctctctctg gaaaacactg actaatgtag caggtttctc tgctccagga 1380 
cttcaggacc ttttcgatgc taataagttt ctccatcagg gccagcttgt tcctcctact 1440 
gagcttgaga gcccttgttg aagttgtggt ttgggggact ggaccgatga cctcaaaggt 1500 
tccctttgct cccaagcctc agagtctagg aggccagagg gtctcagcag gcctttgtcc 1560 
ttctcagctg tctcttactg gctttctcca caggtcttgt agcttcaatg agcatggcta 1620 
ccacctcttc caggctatgc ggcttggggt tgaggagata aacaactcca cggccctgct 1680 
gcccaacatc accctggggt accagctgta tgatgtgtgt tctgactctg ccaatgtgta 1740 
tgccacgctg agagtgctct ccctgccagg gcaacaccac atagagctcc aaggagacct 1800 
tctccactat tcccctacgg tgctggcagt gattgggcct gacagcacca accgtgctgc 1860 
caccacagcc gccctgctga gccctttcct ggtgcccatg gtaagctgga gcctcagacc 1920 
tttgcccatc tcccttcagg caagtctggg nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 1980 
nnnnnnnnnn nnnnnnnnnn gccaccatgc ccggctaatt tttttgtatt tttagtagag 2040 
acggggtttc accgtgttag ccaggctggt cgcaaactcc taacctcgtg atccacccac 2100 
ctcggcctcc caatgtgctg ggattacagg tgtgagccac tgcacccggc cataatgtat 2160 
taatataata aaataattat acaactcacc ataatgtaga atcagtggga gccctgagct 2220 
tgttttccta caactagatg gtcccatctg ggggtgatgg gagacagtga cagatcatca 2280 
gacattagat tctcataagt agcgtgcaac ccagatccct cgcatgtgca gttcacagta 2340 
gggttcaagc tcctacaaga atctgatgct gctgctgatc tgacaggagg ggagcagctg 2400 
taaatacaga tgaagcttcg cttactcacc agctgctcac ctcctcctgt gaggcccggt 2460 
tcctaacagg ccactgacct aacttctgcc ctgacctaca catgcttctc ttcttccttg 2520 
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caaactgcct ccagtggaag tccctgaagg tccccaaaca cacgggacta tttcactcct 2580 
atgcaggttt tgtctccttt gcttggaatg catcccctca ccccttgtcc ccaggcagat 2640 
tcccacccct cccccagaac ctgccccagt ggagccttcg caggtgattt gtcagtttca 2700 
caggctgagg ggtgctctcc tggtctcccc ggctccctgt atccccacac ccagcacagg 2760 
gccaggcact gggggggcct tcagtggaga ctgaaatggc tgaacgggac ctcccataga 2820 
ttagctatgc ggccagcagc gagacgctca gcgtgaagcg gcagtatccc tctttcctgc 2880 
gcaccatccc caatgacaag taccaggtgg agaccatggt gctgctgctg cagaagttcg 2940 
ggtggacctg gatctctctg gttggcagca gtgacgacta tgggcagcta ggggtgcagg 3000 
cactggagaa ccaggccact ggtcagggga tctgcattgc tttcaaggac atcatgccct 3060 
tctctgccca ggtgggcgat gagaggatgc agtgcctcat gcgccacctg gcccaggccg 3120 
gggccaccgt cgtggttgtt ttttccagcc ggcagttggc cagggtgttt ttcgagtccg 3180 
tggtgctgac caacctgact ggcaaggtgt gggtcgcctc agaagcctgg gccctctcca 3240 
ggcacatcac tggggtgccc gggatccagc gcattgggat ggtgctgggc gtggccatcc 3300 
agaagagggc tgtccctggc ctgaaggcgt ttgaagaagc ctatgcccgg gcagacaaga 3360 
aggcccctag gccttgccac aagggctcct ggtgcagcag caatcagctc tgcagagaat 3420 
gccaagcttt catggcacac acgatgccca agctcaaagc cttctccatg agttctgcct 3480 
acaacgcata ccgggctgtg tatgcggtgg cccatggcct ccaccagctc ctgggctgtg 3540 
cctctggagc ttgttccagg ggccgagtct acccctggca ggtaagagag cccaccccag 3600 
cacctcctgt cagggagaac agccaatcct gagatgagca gagtgggcac tctccggtca 3660 
ctctaaatgc caagggggat aaatgccact aacttgaggt tttttgtttt gttttgtttt 3720 
gttttttgag acagtctggc tctgtcaccc aggctgcagt gtagtgatgc gatctcggct 3780 
ctctgcaact tccacctcct gggttcaagt gattctcttg cctcggcctc ctgagtagct 3840 
gggattacag gcacccacca ccatgcctgg ataatttttc ttttcttttt tttttttttg 3900 
agatagagtc tcgctctgtt gcccaggctg gaatgcagtg gtgcgatctt ggctcactgt 3960 
gagctccgcc tcccaggttc actccattcc cctgcctcag cctcccaagt aggtgggact 4020 
acgggcgccc gccaccacgc ccagctaatt ttttttgtat tttgagtaga gacggggttt 4080 
caccatgtta gccaggatgg tctcaatctc ctgaccttgt catccgccca cctcgtcctc 4140 
ccaaagtgct gggattacag gcgtgagcca ccgcacccgg cctaattttt gtatttttag 4200 
tagagatggg gtttcaccat gttggccagg ctggtctcga actcctggca tcaagtgatc 4260 
ctcctgcttc ggcctcccaa agtgctggga ttacaggcat tagctctctt ctcttagaca 4320 
gatctttctc tctgatcctt gccttctctc acccactgtg tcttggaagt gtcaagtgat 4380 
aagatccagg gctaaaactg tctgtaaagg agtgtttgtt agaggcctcc tctcaggagg 4440 
ttggtgggga agattgaggg gcttcctaag aaggaaggga cgagaccttc ctgatgggct 4500 
gaaaccacca ggacggaaac ccaggaaggc cccaggccct tgcttctggg accatgtggg 4560 
tctgtgctgt ctgtggtggc ttcatgatac gcgtttcttt cagcttttgg agcagatcca 4620 
caaggtgcat ttccttctac acaaggacac tgtggcgttt aatgacaaca gagatcccct 4680 
cagtagctat aacataattg cctgggactg gaatggaccc aagtggacct tcacggtcct 4740 
cggttcctcc acatggtctc cagttcagct aaacataaat gagaccaaaa tccagtggca 4800 
cggaaaggac aaccaggtaa tggggatgtg gctactcacc atgtaactgg cttatgggca 4860 
acctagagcc tgggggtgat gctgacacag tgtacaggga gcaggagggg ggccccaggg 4920 
gtccagctgc caccactcta cccatcctgg ccagggaagc agggaagaca ctccgtaggc 4980 
gagtgtgcag atgccctggg gcggaagttc acacgaccag gggccctgcc ctgggagtga 5040 
gccctgaggg cagatgcaca gagattctgt tttctgttcc acatgtgagc tgtcctttga 5100 
cttgggcccc tacgtgtggc ccctctggct tcttacaggt gcctaagtct gtgtgttcca 5160 
gcgactgtct tgaagggcac cagcgagtgg ttacgggttt ccatcactgc tgctttgagt 5220 
gtgtgccctg tggggctggg accttcctca acaagagtgg tgagtgggca atggagcagg 5280 
cgagctaccc agcactcccg ggggctgcac ggtggaggga gggcctccct tgggccccat 5340 
gtgccctgcc ccagaaccaa ggcccagtca ctgggctgcc agttagcttc aggttggagg 5400 
acacctgcta ccagacagaa ttctgatcaa gagaatcagc cactgggtgc ggtggctcat 5460 
gcctgtaatc ccagcacttt gggaggctga ggcgggtgga tcacttgagg tcgggagttc 5520 
gagaccagcc tggccaacat ggtgaaaccc catctctacc aaaaatataa aaaattagct 5580 
gggtgtggtg gcgcgtgcct gtaatcccag ctactcggga ggctgaggca ggagaatcac 5640 
ttgaacccag gaggcggagg ttgcagtgag ccaagatgca ttccagcctg gaccacaaag 5700 
cgagaattcg tccccccaaa aaaagaaagg aggccgggcg cggtggctca cacctgtaat 5760 
cccagcactt tgggaggccg aggtgggtgg atcacctgag gtcaggagtt cgagaccagc 5820 
ctgaccaaca tggtgaaacc ccatctctac taaaaataca aaaaaagtta gccgggcgtt 5880 
gtggcgtgtg cctgtaattc cagctactcg ggaggctgag gcaggagaat tgcttgaacc 5940 
cgggaggcgg aggttgcagt gagccaagat tgcaccattg cactccagcc tgggcgacaa 6000 
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gagaaaaact ctgtctcaaa aaaaaagaaa gaaagaaaga attagccaac tgaaagcctt 6060 
agactgaggt gtgtcctctg ttagagagct gtcatcacaa ctcctacaaa agcagtcgta 6120 
tcctgaattc aacctctttc tctaaatgaa tatagctatt gttccctttg tgccctcttg 6180 
tcctactgtc ccttctgttg cccatgccaa agacagctag ctccttgaac agcttggcct 6240 
gaatacagat actagcgtgt ctgcagcaga gaaaaaaaca gcattcccca tccagaaatg 6300 
caaggtcaag aacagagagc aaattaggta gctaaggact caggtcctta gttggtgtcc 6360 
aggggccaca ttctttcctt tcaccatctc tgtagggaca ggaatacttc ccttctgtcc 6420 
tcagagggtc aggactcaga gaaaccacag agcagcagct caggaaagtg gttcatggaa 6480 
atgctggcaa gagagagggg ttacaatgcc ctcccttggg agcaggctgc tcccatcaga 6540 
tcgtaacctc tctggtatgt gggcagagct accaggttaa ggtcctccct agggtttgca 6600 
aaaccctcat gggatcatga gccatacaga accgacctgt gtgtctccag agtctgtaat 6660 
taacacaggc attttgagga aatgcgtggc ctcaggcccc actcccggct acccccatcc 6720 
cactatgcct agtatagtct agctgccctg gtacaattct cccagtatct tgcaggcccc 6780 
tatttcctat tcctactctg ctcatctggc tctcaggaac cttcttggcc ttccctttca 6840 
gacctctaca gatgccagcc ttgtgggaaa gaagagtggg cacctgaggg aagccagacc 6900 
tgcttcccgc gcactgtggt gtttttggct ttgcgtgagc acacctcttg ggtgctgctg 6960 
gcagctaaca cgctgctgct gctgctgctg cttgggactg ctggcctgtt tgcctggcac 7020 
ctagacaccc ctgtggtgag gtcagcaggg ggccgcctgt gctttcttat gctgggctcc 7080 
ctggcagcag gtagtggcag cctctatggc ttctttgggg aacccacaag gcctgcgtgc 7140 
ttgctacgcc aggccctctt tgcccttggt ttcaccatct tcctgtcctg cctgacagtt 7200 
cgctcattcc aactaatcat catcttcaag ttttccacca aggtacctac attctaccac 7260 
gcctgggtcc aaaaccacgg tgctggcctg tttgtgatga tcagctcagc ggcccagctg 7320 
cttatctgtc taacttggct ggtggtgtgg accccactgc ctgctaggga ataccagcgc 7380 
ttcccccatc tggtgatgct tgagtgcaca gagaccaact ccctgggctt catactggcc 7440 
ttcctctaca atggcctcct ctccatcagt gcctttgcct gcagctacct gggtaaggac 7500 
ttgccagaga actacaacga ggccaaatgt gtcaccttca gcctgctctt caacttcgtg 7560 
tcctggatcg ccttcttcac cacggccagc gtctacgacg gcaagtacct gcctgcggcc 7620 
aacatgatgg ctgggctgag cagcctgagc agcggcttcg gtgggtattt tctgcctaag 7680 
tgctacgtga tcctctgccg cccagacctc aacagcacag agcacttcca ggcctccatt 7740 
caggactaca cgaggcgctg cggctccacc tgaccagtgg gtcagcaggc acggctggca 7800 
gccttctctg ccctgagggt cgaaggtcga gcaggccggg ggtgtccggg aggtctttgg 7860 
gcatcgcggt ctggggttgg gacgtgtaag cgcctgggag agcctagacc aggctccggg 7920 
ctgccaataa agaagtgaaa tgcgtatctg gtctcctgtc gtgggagagt gtgaggtgta 7980 
acggattcaa gtctgaaccc agagcctgga aaaggctgac cgcccagatt gacgttgcta 8040 
ggcaactccg gaggcgggcc cagcgccaaa agaacagggc gaggcgtcgt ccccgcatcc 8100 
cattggccgt tctctgcggg gccccgccct cgggggccgg agctagaagc tctacgcttc 8160 
cgaggcgcac ctcctggcct gcacgctttg acgt 8194 



<210> 16 
<211> 2526 
<212> DNA 

<213> Homo sapiens 
<400> 16 

atgctgctct gcacggctcg cctggtcggc ctgcagcttc tcatttcctg ctgctgggcc 60 
tttgcctgcc atagcacgga gtcttctcct gacttcaccc tccccggaga ttacctcctg 120 
gcaggcctgt tccctctcca ttctggctgt ctgcaggtga ggcacagacc cgaggtgacc 180 
ctgtgtgaca ggtcttgtag cttcaatgag catggctacc acctcttcca ggctatgcgg 240 
cttggggttg aggagataaa caactccacg gccctgctgc ccaacatcac cctggggtac 300 
cagctgtatg atgtgtgttc tgactctgcc aatgtgtatg ccacgctgag agtgctctcc 360 
ctgccagggc aacaccacat agagctccaa ggagaccttc tccactattc ccctacggtg 420 
ctggcagtga ttgggcctga cagcaccaac cgtgctgcca ccacagccgc cctgctgagc 480 
cctttcctgg tgcccatgat tagctatgcg gccagcagcg agacgctcag cgtgaagcgg 540 
cagtatccct ctttcctgcg caccatcccc aatgacaagt accaggtgga gaccatggtg 600 
ctgctgctgc agaagttcgg gtggacctgg atctctctgg ttggcagcag tgacgactat 660 
gggcagctag gggtgcaggc actggagaac caggccactg gtcaggggat ctgcattgct 720 
ttcaaggaca tcatgccctt ctctgcccag gtgggcgatg agaggatgca gtgcctcatg 780 
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cgccacctgg 

agggtgtttt 

gaagcctggg 

gtgctgggcg 

tatgcccggg 

aatcagctct 

ttctccatga 

caccagctcc 

cttttggagc 

gacaacagag 

tggaccttca 

accaaaatcc 

tgtcttgaag

ccctgtgggg 

aaagaagagt 

gctttgcgtg 

ctgcttggga 

gggggccgcc

ggcttctttg 

ggtttcacca 

aagttttcca 

ctgtttgtga 

tggaccccac 

acagagacca 

agtgcctttg 

tgtgtcacct 

agcgtctacg 

agcagcggct 

ctcaacagca 

acctga 



cccaggccgg 
tcgagtccgt 
ccctctccag 
tggccatcca 
cagacaagaa 
gcagagaatg 
gttctgccta 

tgggctgtgc 

agatccacaa 
atcccctcag 
cggtcctcgg 
agtggcacgg 
ggcaccagcg 
ctgggacctt 
gggcacctga 
agcacacctc 
ctgctggcct 
tgtgctttct 
gggaacccac 
tcttcctgtc 
ccaaggtacc 
tgatcagctc 
tgcctgctag 
actccctggg 
cctgcagcta 
tcagcctgct 
acggcaagta 
tcggtgggta 
cagagcactt 



ggccaccgtc 
ggtgctgacc 
gcacatcact 
gaagagggct 
ggcccctagg 
ccaagctttc 
caacgcatac 
ctctggagct 
ggtgcatttc 
tagctataac 
ttcctccaca 
aaaggacaac 
agtggttacg 
cctcaacaag 
gggaagccag 
ttgggtgctg 
gtttgcctgg 
tatgctgggc 
aaggcctgcg 
ctgcctgaca 
tacattctac 
agcggcccag 
ggaataccag 
cttcatactg 
cctgggtaag 
cttcaacttc 
cctgcctgcg 
ttttctgcct 
ccaggcctcc 



gtggttgttt 
aacctgactg 
ggggtgcccg
gtccctggcc 
ccttgccaca 
atggcacaca 
cgggctgtgt 
tgttccaggg 
cttctacaca 
ataattgcct 
tggtctccag 
caggtgccta 
ggtttccatc 
agtgacctct 
acctgcttcc 
ctggcagcta 
cacctagaca 
tccctggcag 
tgcttgctac 
gttcgctcat 
cacgcctggg 
ctgcttatct 
cgcttccccc 
gccttcctct 
gacttgccag 
gtgtcctgga 
gccaacatga 
aagtgctacg 
attcaggact 



tttccagccg 
gcaaggtgtg 
ggatccagcg 
tgaaggcgtt 

agggctcctg
cgatgcccaa 
atgcggtggc 
gccgagtcta 
aggacactgt 
gggactggaa 
ttcagctaaa 
agtctgtgtg 
actgctgctt 
acagatgcca 
cgcgcactgt 
acacgctgct 
cccctgtggt 
caggtagtgg 
gccaggccct 
tccaactaat 
tccaaaacca 
gtctaacttg 
atctggtgat 
acaatggcct 
agaactacaa 
tcgccttctt 
tggctgggct 
tgatcctctg 
acacgaggcg 



gcagttggcc 
ggtcgcctca 
cattgggatg 
tgaagaagcc 
gtgcagcagc 
gctcaaagcc 
ccatggcctc 
cccctggcag 
ggcgtttaat 
tggacccaag 
cataaatgag 
ttccagcgac 
tgagtgtgtg 
gccttgtggg 
ggtgtttttg 
gctgctgctg 
gaggtcagca 
cagcctctat 
ctttgccctt 
catcatcttc 
cggtgctggc 
gctggtggtg 
gcttgagtgc 
cctctccatc 
cgaggccaaa 
caccacggcc 
gagcagcctg 
ccgcccagac 
ctgcggctcc 



840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2526 



<210> 17 
<211> 841 
<212> PRT 

<213> Homo sapiens 



<400> 17 
Met Leu Leu Cys Thr Ala Arg Leu Val Gly Leu Gln Leu Leu Ile Ser
1 5 10 15

Cys Cys Trp Ala Phe Ala Cys His Ser Thr Glu Ser Ser Pro Asp Phe
20 25 30

Thr Leu Pro Gly Asp Tyr Leu Leu Ala Gly Leu Phe Pro Leu His Ser
35 40 45

Gly Cys Leu Gln Val Arg His Arg Pro Glu Val Thr Leu Cys Asp Arg
50 55 60

Ser Cys Ser Phe Asn Glu His Gly Tyr His Leu Phe Gln Ala Met Arg
65 70 75 80

Leu Gly Val Glu Glu Ile Asn Asn Ser Thr Ala Leu Leu Pro Asn Ile
85 90 95

Thr Leu Gly Tyr Gln Leu Tyr Asp Val Cys Ser Asp Ser Ala Asn Val
100 105 110

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Tyr Ala Thr Leu Arg Val Leu Ser Leu Pro Gly Gin His His lie Glu 
115 120 125 

Leu Gln Gly Asp Leu Leu His Tyr Ser Pro Thr Val Leu Ala Val Ile
130 135 140

Gly Pro Asp Ser Thr Asn Arg Ala Ala Thr Thr Ala Ala Leu Leu Ser
145 150 155 160

Pro Phe Leu Val Pro Met Ile Ser Tyr Ala Ala Ser Ser Glu Thr Leu
165 170 175

Ser Val Lys Arg Gln Tyr Pro Ser Phe Leu Arg Thr Ile Pro Asn Asp
180 185 190

Lys Tyr Gln Val Glu Thr Met Val Leu Leu Leu Gln Lys Phe Gly Trp
195 200 205

Thr Trp Ile Ser Leu Val Gly Ser Ser Asp Asp Tyr Gly Gln Leu Gly
210 215 220

Val Gln Ala Leu Glu Asn Gln Ala Thr Gly Gln Gly Ile Cys Ile Ala
225 230 235 240

Phe Lys Asp Ile Met Pro Phe Ser Ala Gln Val Gly Asp Glu Arg Met
245 250 255

Gln Cys Leu Met Arg His Leu Ala Gln Ala Gly Ala Thr Val Val Val
260 265 270

Val Phe Ser Ser Arg Gln Leu Ala Arg Val Phe Phe Glu Ser Val Val
275 280 285

Leu Thr Asn Leu Thr Gly Lys Val Trp Val Ala Ser Glu Ala Trp Ala
290 295 300

Leu Ser Arg His Ile Thr Gly Val Pro Gly Ile Gln Arg Ile Gly Met
305 310 315 320

Val Leu Gly Val Ala Ile Gln Lys Arg Ala Val Pro Gly Leu Lys Ala
325 330 335

Phe Glu Glu Ala Tyr Ala Arg Ala Asp Lys Lys Ala Pro Arg Pro Cys
340 345 350

His Lys Gly Ser Trp Cys Ser Ser Asn Gln Leu Cys Arg Glu Cys Gln
355 360 365

Ala Phe Met Ala His Thr Met Pro Lys Leu Lys Ala Phe Ser Met Ser
370 375 380

Ser Ala Tyr Asn Ala Tyr Arg Ala Val Tyr Ala Val Ala His Gly Leu
385 390 395 400

His Gln Leu Leu Gly Cys Ala Ser Gly Ala Cys Ser Arg Gly Arg Val
405 410 415
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Tyr Pro Trp Gin Leu Leu Glu Gin lie His Lys Val His Phe Leu Leu 
420 425 430 

His Lys Asp Thr Val Ala Phe Asn Asp Asn Arg Asp Pro Leu Ser Ser
435 440 445

Tyr Asn Ile Ile Ala Trp Asp Trp Asn Gly Pro Lys Trp Thr Phe Thr
450 455 460

Val Leu Gly Ser Ser Thr Trp Ser Pro Val Gln Leu Asn Ile Asn Glu
465 470 475 480

Thr Lys Ile Gln Trp His Gly Lys Asp Asn Gln Val Pro Lys Ser Val
485 490 495

Cys Ser Ser Asp Cys Leu Glu Gly His Gln Arg Val Val Thr Gly Phe
500 505 510

His His Cys Cys Phe Glu Cys Val Pro Cys Gly Ala Gly Thr Phe Leu
515 520 525

Asn Lys Ser Asp Leu Tyr Arg Cys Gln Pro Cys Gly Lys Glu Glu Trp
530 535 540

Ala Pro Glu Gly Ser Gln Thr Cys Phe Pro Arg Thr Val Val Phe Leu
545 550 555 560

Ala Leu Arg Glu His Thr Ser Trp Val Leu Leu Ala Ala Asn Thr Leu
565 570 575

Leu Leu Leu Leu Leu Leu Gly Thr Ala Gly Leu Phe Ala Trp His Leu
580 585 590

Asp Thr Pro Val Val Arg Ser Ala Gly Gly Arg Leu Cys Phe Leu Met
595 600 605

Leu Gly Ser Leu Ala Ala Gly Ser Gly Ser Leu Tyr Gly Phe Phe Gly
610 615 620

Glu Pro Thr Arg Pro Ala Cys Leu Leu Arg Gln Ala Leu Phe Ala Leu
625 630 635 640

Gly Phe Thr Ile Phe Leu Ser Cys Leu Thr Val Arg Ser Phe Gln Leu
645 650 655

Ile Ile Ile Phe Lys Phe Ser Thr Lys Val Pro Thr Phe Tyr His Ala
660 665 670

Trp Val Gln Asn His Gly Ala Gly Leu Phe Val Met Ile Ser Ser Ala
675 680 685

Ala Gln Leu Leu Ile Cys Leu Thr Trp Leu Val Val Trp Thr Pro Leu
690 695 700

Pro Ala Arg Glu Tyr Gln Arg Phe Pro His Leu Val Met Leu Glu Cys
705 710 715 720



i 



Thr Glu Thr Asn 



Leu Leu Ser Ile
740 

Pro Glu Asn Tyr 
755 

Asn Phe Val Ser 
770 

Gly Lys Tyr Leu 
785 

Ser Ser Gly Phe 



Cys Arg Pro Asp 
820 

Asp Tyr Thr Arg 
835 



Ser Leu Gly Phe 
725 

Ser Ala Phe Ala 



Asn Glu Ala Lys 
760 

Trp Ile Ala Phe
775 

Pro Ala Ala Asn 
790 

Gly Gly Tyr Phe 
805 

Leu Asn Ser Thr 



Arg Cys Gly Ser 
840 
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lie Leu Ala Phe 
730 

Cys Ser Tyr Leu 
745 

Cys Val Thr Phe 



Phe Thr Thr Ala 
780 

Met Met Ala Gly 
795 

Leu Pro Lys Cys 
810 

Glu His Phe Gin 
825 

Thr 



Leu Tyr Asn Gly 
735 

Gly Lys Asp Leu 
750 

Ser Leu Leu Phe 
765 

Ser Val Tyr Asp 



Leu Ser Ser Leu 
800 

Tyr Val Ile Leu
815

Ala Ser Ile Gln
830 



<210> 18 
<211> 14 
<212> PRT 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Consensus 
sequence 

<220> 

<221> MOD_RES

<222> (1) 

<223> Thr or Arg 



<220> 

<221> MOD_RES 

<222> (3) 

<223> Phe or Leu 



<220>

<221> MOD_RES
<222> (4)
<223> Arg, Gln or Pro

<220>

<221> MOD_RES
<222> (6)
<223> Arg or Thr

<220>

<221> MOD_RES

<222> (7)

<223> Ser, Pro or Val



• l 1 
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<220> 

<221> MOD_RES 
<222> (8) 

<223> Val, Glu, Arg, Lys or Thr 
<220> 

<221> MOD_RES

<222> (11) 

<223> Ala or Glu 

<220> 

<221> MOD_RES 

<222> (12) 

<223> Trp or Leu 

<220> 

<221> MOD_RES 
<222> (13) 

<223> Arg, His or Gly 

<400> 18

Xaa Cys Xaa Xaa Arg Xaa Xaa Xaa Phe Leu Xaa Xaa Xaa Glu 
1 5 10



<210> 19 
<211> 15 
<212> PRT 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Consensus 
sequence 

<220> 

<221> MOD_RES 

<222> (1) 

<223> Leu or Gln

<220> 

<221> MOD_RES
<222> (3) 

<223> Glu, Gly or Thr 
<220> 

<221> MOD_RES 
<222> (4) 

<223> Asn, Arg or Cys 
<220> 

<221> MOD_RES 

<222> (7) 

<223> Arg or Glu 

<220> 

<221> MOD_RES 
<222> (9) 
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<223> Arg or Lys 
<220> 

<221> MOD_RES 
<222> (10) 

<223> Cys, Gly or Phe 
<220> 

<221> MOD_RES 
<222> (11) 

<223> Val, Leu or Ile
<220> 

<221> MOD_RES 

<222> (13) 

<223> Phe or Leu 

<220> 

<221> MOD_RES

<222> (14) 

<223> Ala or Ser 

<220> 

<221> MOD_RES 

<222> (15) 

<223> Met or Leu 

<400> 19 

Xaa Pro Xaa Xaa Tyr Asn Xaa Ala Xaa Xaa Xaa Thr Xaa Xaa Xaa 
1 5 10 15



<210> 20 

<211> 3563 

<212> DNA 

<213> Homo sapiens 



<400> 20 

agcctggcag 

ggacaccact 

tcctctgccc 

ctgccgtgcc 

ctctgggctc 

atgaaggggg 

ctccgcagcc 

tgggtcgggg 

ctgcggttct 

aaatggccgt 

acgacctctt 

tggccaaggc 

gtgtgctggc 

tcagcttctt 

cctgccccgt 

cctgggagcc 

ggagctgctg 

tgtgcagctg 

cctgggcagc 

ggcacgcggc 



tggcctcagg 
ggggccccag 
gctccccgcc 
tgttggaagt 
tcctgcaccc 
actacgtgct 
ggacacggcc 
tcagggtgac 
gtgtggcccc 
ggaggagatc 
tgatacgtgc 
aggcagccgc 
tgtcatcggg 
cctcatgccc 

gggagcccct 

ctgtgtcaga 
agcgcccggg 
acggccgccg 
gacgacgagt 
atctgcatcg 



cagagtctga 
ggtgtggcaa 
ccgggctcac 
tgcctctgcc 
tgggacgggg 
gggggggctg 
cagcagccct 
caggtctggg 
aggttctcct 
aacaacaagt 
tcggagcctg 
gacatcgccg 
ccccactcgt 
cagtggggcg 
tgtgtcagga 
agatgctctt 
agaccttccc 

cggagctgct

acggccggca 
cgcacgaggg 



cgcgcacaaa 
gtgaggatgg 
tccatgtgag 
atgctgggcc 
gccccattgt 
ttccccctgg 
gtgtgcacca 
gtgctcctga 
caaacggcct 
cggatctgct 
tggtggccat 
cctactgcaa 
cagagctcgc 
ccccccacca 
gaatgctaca 
ggccttgcag 
ctccttcttc 
gcaggagttc 
gggcctgagc 
cctggtgccg 



ctttcaggcc 
caagggtttt 
gccccagtcg 
ctgctgtcct 
gcctgtcaca 
gcgaggccga 
ggtacagagg 
gctggggccg 
gctctgggca 
gcccgggctg 
gaagcccagc 
ctacacgcag 
catggtcacc 
tcacccaccc 
tgcaccccac 
gtcagctacg 
cgcaccgtgc 
ggctggaact 
atcttctcgg 
ctgccccgtg 



caggaagcga 
gctaaacaaa 
gggcagccac 
gggcctcagc 
gcaacttagg 
ggaggctggc 
tgggacggcc 

aggtggccat 

ctggccatga 
cgcctgggct 
ctcatgttcc 
taccagcccc 
ggcaagttct 
ccaaccaacc 
ccagccctgc 
gtgctagcat 
ccagcgaccg 
gggtggccgc 
ccctggccgc 
ccgatgactc 



60 

120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 



: ') 
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gcggctgggg 
gctgctgttc 
gctctcgccc 
gctgcccggc 
gcacgagttc 
ctctgccctg 
gcagtgtgac 
ctctgtctac 
cgcctcaggc 
gggtgtgctg 
aggtggctgg 
gaccttccac 
gtacgacctg 
gttcaacggc 
ggtgaggtga 
ctgggggtgg 
caggcctgtg 
cgccgggtca 
taccggcaaa 
agggtcctgc 
gcgcccttct 
tccccggagc 
ccggctgtgc 

"ggggctgt 
gcctgctttg 
cagcccagcc 
tgcctgagca 
agctgggcag 
ctggccatgc 
gtggtgacgg 
tgggtcagct 
ggcactttcc 
gccatgctgg 
gtggtcctca 
gctgccttcc 
gagttcttcc 
aatcagggga 
gctgcgatcc 
aggttctgac 
acgtggacac 



aaggtgcagg 
gcctccgtgc 
aaggtgtggg 
atggcccaga 
ccccagtacg 
ggcgagaggg 
tgcatcacgc 
gcagctgtgt 
tgccccgcgc 
tcctctgcat 
cggctcagcc 
gtgggcgggc 
aagctgtggg 
agcctcagga 
gggtgggtgt 
gggccgttcc 
cgcagaagcc 

aggggttcca 

acccaggtga 
caagtcctga 
cctctctcac 
gaagcacacg 
tgctgctgct 
tcgttcacca 
gcctggtgtg 
ctgcccgatg 
cactcttcct 
accggctgag 
tggtggaggt 
actggcacat 
tcggcctagc 
tggtgcggag 
cctacttcat 
ggcccgccgt 
acctgcccag 
tgggaggggg 
aacatgagtg 
cccccaagcc 
cccaggttgt 
ccctgtgacc 



acgtcctgca 
acgccgccca 
tggccagcga 
tgggcacggt 
tgaagacgca 
agcagggtct 
tgcagaacgt 
atagcgtggc 
aggaccccgt 
gtgcccaggc 
ccgtcccccg 
tgccgctgcg 
tgtggcaggg 
cagagcgcct 
gccaggcgtg 
agtctcccgt 
cgtgtcccgg 
ctcctgctgc 
gccgccttcc 
ctctgagacc 
agacgacatc 
ctgcttccgc 
cctgctgctg 
tcgggacagc 
cctgggcctg 
cctggcccag 
gcaggcggcc 
tggctgcctg 
cgcactgtgc 
gctgcccacg 
gcacgccacc 
ccagccgggc 
cacctgggtc 
gcagatgggc 
gtgttacctg 
ccctggggat 
acccaaccct 
agcaatgacc 
ctcctgaccc 
atc



ccaggtgaac
cgccctcttc
ggcctggctg
gcttggcttc
cctggccctg
ggaggaggac
gagcgcaggg
ccaggccctg
gaagccctgg
caccaggcac
cccgcagctc
gttcgacagc
ctcagtgccc
gaagatccgc
cccgtggtag
gggcatgccc
tgctcgcggc
tacgactgtg
cggcaggcgg
agagcccaca
gcctgcacct
cgcaggtctc
agcctggcgc
ccactggttc
gtctgcctca
cagcccttgt
gagatcttcg

cgggggccct

acctggtacc
gaggcgctgg
aatgccacgc
tgctacaacc
tcctttgtgc
gccctcctgc
ctcatgcggc
gcccaaggcc
gtgatctcag
cgtgtctcgc
tgaccccaca 



cagagcagcg
aactacagca
acctctgacc
ctccagaggg
gccaccgacc
gtggtgggcc
ctaaatcacc
cacaacactc
caggtgagcc
ggccaccacg
ctggagaaca
agcggaaacg
aggctccacg
tggcacacgt
cccccgcggc
agccgagcag
agtgccagga
tggactgcga
gggtgggaac
gggtacaaga
tttgtggcca
ggttcctggc
tgggccttgt
aggcctcggg
gcgtcctcct
cccacctccc
tggagtcaga
gggcctggct
tggtggcctt
tgcactgccg
tggcctttct
gtgcccgtgg
ccctcctggc
tctgtgtcct
agccagggct
agaatgacgg
ccccggtgaa
tacagagacc
gtgagcccta



tgcaggtggt
tcagcagcag
tggtcatggg
gtgcccagct
cggccttctg
agcgctgccc
accagacgtc
ttcagtgcaa
cgggagatgg
cctgagctgg
tgtacaacct
tggacatgga
acgtgggcag
ctgacaacca
agggcgcagc
agccagaccc
gggccaggtg

ggcgggcagc
gcagcagggg
cgaacaccca
ggatgagtgg
atggggcgag
gctggctgct
ggggcccctg
gttccctggc
gctcacgggc
actgcctctg
ggtggtgctg
cccgccggag
cacacgctcc
ctgcttcctg
cctcaccttt
caatgtgcag
gggcatcctg
caacaccccc
gaacacagga
cccagactta
ctcccgctct
ggcctggagc



1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3563 



<210> 21 
<211> 839 
<212> PRT 

<213> Homo sapiens 
<400> 21 

Met Gly Pro Arg Ala Lys Thr Ile Cys Ser Leu Phe Phe Leu Leu Trp
1 5 10 15

Val Leu Ala Glu Pro Ala Glu Asn Ser Asp Phe Tyr Leu Pro Gly Asp
20 25 30



Tyr Leu Leu Gly Gly Leu Phe Ser Leu His Ala Asn Met Lys Gly Ile
35 40 45



) 



24 

Val His Leu Asn Phe Leu Gln Val Pro Met Cys Lys Glu Tyr Glu Val
50 55 60

Lys Val Ile Gly Tyr Asn Leu Met Gln Ala Met Arg Phe Ala Val Glu
65 70 75 80

Glu Ile Asn Asn Asp Ser Ser Leu Leu Pro Gly Val Leu Leu Gly Tyr
85 90 95

Glu Ile Val Asp Val Cys Tyr Ile Ser Asn Asn Val Gln Pro Val Leu
100 105 110

Tyr Phe Leu Ala His Glu Asp Asn Leu Leu Pro Ile Gln Glu Asp Tyr
115 120 125

Ser Asn Tyr Ile Ser Arg Val Val Ala Val Ile Gly Pro Asp Asn Ser
130 135 140

Glu Ser Val Met Thr Val Ala Asn Phe Leu Ser Leu Phe Leu Leu Pro
145 150 155 160

Gln Ile Thr Tyr Ser Ala Ile Ser Asp Glu Leu Arg Asp Lys Val Arg
165 170 175

Phe Pro Ala Leu Leu Arg Thr Thr Pro Ser Ala Asp His His Val Glu
180 185 190

Ala Met Val Gln Leu Met Leu His Phe Arg Trp Asn Trp Ile Ile Val
195 200 205

Leu Val Ser Ser Asp Thr Tyr Gly Arg Asp Asn Gly Gln Leu Leu Gly
210 215 220

Glu Arg Val Ala Arg Arg Asp Ile Cys Ile Ala Phe Gln Glu Thr Leu
225 230 235 240

Pro Thr Leu Gln Pro Asn Gln Asn Met Thr Ser Glu Glu Arg Gln Arg
245 250 255

Leu Val Thr Ile Val Asp Lys Leu Gln Gln Ser Thr Ala Arg Val Val
260 265 270

Val Val Phe Ser Pro Asp Leu Thr Leu Tyr His Phe Phe Asn Glu Val
275 280 285

Leu Arg Gln Asn Phe Thr Gly Ala Val Trp Ile Ala Ser Glu Ser Trp
290 295 300

Ala Ile Asp Pro Val Leu His Asn Leu Thr Glu Leu Gly His Leu Gly
305 310 315 320

Thr Phe Leu Gly Ile Thr Ile Gln Ser Val Pro Ile Pro Gly Phe Ser
325 330 335

Glu Phe Arg Glu Trp Gly Pro Gln Ala Gly Pro Pro Pro Leu Ser Arg
340 345 350



25 

Thr Ser Gln Ser Tyr Thr Cys Asn Gln Glu Cys Asp Asn Cys Leu Asn
355 360 365

Ala Thr Leu Ser Phe Asn Thr Ile Leu Arg Leu Ser Gly Glu Arg Val
370 375 380

Val Tyr Ser Val Tyr Ser Ala Val Tyr Ala Val Ala His Ala Leu His
385 390 395 400

Ser Leu Leu Gly Cys Asp Lys Ser Thr Cys Thr Lys Arg Val Val Tyr
405 410 415

Pro Trp Gln Leu Leu Glu Glu Ile Trp Lys Val Asn Phe Thr Leu Leu
420 425 430

Asp His Gln Ile Phe Phe Asp Pro Gln Gly Asp Val Ala Leu His Leu
435 440 445

Glu Ile Val Gln Trp Gln Trp Asp Arg Ser Gln Asn Pro Phe Gln Ser
450 455 460

Val Ala Ser Tyr Tyr Pro Leu Gln Arg Gln Leu Lys Asn Ile Gln Asp
465 470 475 480

Ile Ser Trp His Thr Val Asn Asn Thr Ile Pro Met Ser Met Cys Ser
485 490 495

Lys Arg Cys Gln Ser Gly Gln Lys Lys Lys Pro Val Gly Ile His Val
500 505 510

Cys Cys Phe Glu Cys Ile Asp Cys Leu Pro Gly Thr Phe Leu Asn His
515 520 525

Thr Glu Asp Glu Tyr Glu Cys Gln Ala Cys Pro Asn Asn Glu Trp Ser
530 535 540

Tyr Gln Ser Glu Thr Ser Cys Phe Lys Arg Gln Leu Val Phe Leu Glu
545 550 555 560

Trp His Glu Ala Pro Thr Ile Ala Val Ala Leu Leu Ala Ala Leu Gly
565 570 575

Phe Leu Ser Thr Leu Ala Ile Leu Val Ile Phe Trp Arg His Phe Gln
580 585 590

Thr Pro Ile Val Arg Ser Ala Gly Gly Pro Met Cys Phe Leu Met Leu
595 600 605

Thr Leu Leu Leu Val Ala Tyr Met Val Val Pro Val Tyr Val Gly Pro
610 615 620

Pro Lys Val Ser Thr Cys Leu Cys Arg Gln Ala Leu Phe Pro Leu Cys
625 630 635 640

Phe Thr Ile Cys Ile Ser Cys Ile Ala Val Arg Ser Phe Gln Ile Val
645 650 655



) 
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Cys Ala Phe Lys Met Ala Ser Arg Phe Pro Arg Ala Tyr Ser Tyr Trp 
660 665 670 

Val Arg Tyr Gln Gly Pro Tyr Val Ser Met Ala Phe Ile Thr Val Leu
675 680 685

Lys Met Val Ile Val Val Ile Gly Met Leu Ala Thr Gly Leu Ser Pro
690 695 700



Thr Thr Arg Thr Asp Pro Asp Asp Pro Lys Ile Thr Ile Val Ser Cys
705 710 715 720

Asn Pro Asn Tyr Arg Asn Ser Leu Leu Phe Asn Thr Ser Leu Asp Leu
725 730 735

Leu Leu Ser Val Val Gly Phe Ser Phe Ala Tyr Met Gly Lys Glu Leu
740 745 750

Pro Thr Asn Tyr Asn Glu Ala Lys Phe Ile Thr Leu Ser Met Thr Phe
755 760 765

Tyr Phe Thr Ser Ser Val Ser Leu Cys Thr Phe Met Ser Ala Tyr Ser
770 775 780

Gly Val Leu Val Thr Ile Val Asp Leu Leu Val Thr Val Leu Asn Leu
785 790 795 800

Leu Ala Ile Ser Leu Gly Tyr Phe Gly Pro Lys Cys Tyr Met Ile Leu
805 810 815

Phe Tyr Pro Glu Arg Asn Thr Pro Ala Tyr Phe Asn Ser Met Ile Gln
820 825 830

Gly Tyr Thr Met Arg Arg Asp
835



<210> 22 
<211> 6 
<212> PRT 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Synthetic 
PDZIP peptide sequence 

<400> 22 

Ser Val Ser Thr Val Val 
1 5 



<210> 23 
<211> 2520 
<212> DNA 

<213> Homo sapiens 
<400> 23 

atggggccca gggcaaagac catctgctcc ctgttcttcc tcctatgggt cctggctgag 



27 



ccggctgaga 
ctccatgcca 
gagtatgaag 
gagatcaaca 
gtgtgctaca 
ctccttccca 
cctgacaact 
cagatcacct 
ctgcgtacca 
ttccgctgga 
cagctgcttg 
cccacactgc 
gtggacaagc 
ctgtaccact 
tccgagtcct 
accttcctgg 
tggggcccac 
caggagtgcg 
ggggagcgtg 
agcctcctcg 
cttgaggaga 
caaggggacg 
cccttccaga 
atctcctggc 
tcagggcaaa 
cttcccggca 
aacgagtggt 
tggcatgagg 
ctggccatcc 
ggccccatgt 
tacgtggggc 
ttcacaattt 
atggccagcc 
tctatggcat 
ggcctcagtc 
aaccccaact 
gtgggtttca 
ttcatcaccc 
tctgcctaca 
ctggccatca 
cgcaacacgc 



actcggactt 
acatgaaggg 
tgaaggtgat 
atgacagcag 
tctccaacaa 
tccaagagga 
ccgagtctgt 
acagcgccat 
cacccagcgc 
actggatcat 
gcgagcgcgt 
agcccaacca 
tgcagcagag 
tcttcaatga 
gggccatcga 
gcatcaccat 
aggctgggcc 
acaactgcct 
tcgtctacag 
gctgtgacaa 
tctggaaggt 
tggctctgca 
gcgtcgcctc 
acaccgtcaa 
agaagaagcc 
ccttcctcaa 
cctaccagag 
cacccaccat 
tggtgatatt 
gcttcctgat 
cgcccaaggt 
gcatctcctg 
gcttcccacg 
ttatcacggt 
ccaccacccg 
accgcaacag 
gcttcgccta 
tcagcatgac 
gcggggtgct 
gcctgggcta 
ccgcctactt 



ctacctgcct 
cattgttcac 
aggctacaac 
cctgctgcct 
tgtccagccg 
ctacagtaac 
catgactgtg 
cagcgatgag 
cgaccaccac 
tgtgctggtg 
ggcccggcgc 
gaacatgacg 
cacagcgcgc 
ggtgctgcgc 
cccggtcctg 
ccagagcgtg 
gccacccctc 
gaacgccacc 
cgtgtactct 
aagcacctgc 
caacttcact 
cttggagatt 
ctactacccc 
caacacgatc 

tgtgggcatc 

ccacactgaa 
tgagacctcc 
cgctgtggcc 
ctggaggcac 
gctgacactg 
ctccacctgc 
tatcgccgtg 
cgcctacagc 
actcaaaatg 
tactgacccc 
cctgctgttc 
catgggcaaa 
cttctatttc 
ggtcaccatc 
cttcggcccc 
caacagcatg 



ggggattacc 
cttaacttcc 
ctcatgcagg 

ggtgtgctgc 

gtgctctact 
tacatttccc 
gccaacttcc 
ctgcgagaca 
gtcgaggcca 
agcagcgaca 
gacatctgca 
tcagaggagc 
gtcgtggtcg 
cagaacttca 
cacaacctca 
cccatcccgg 
agcaggacca 
ttgtccttca 
gcggtctatg 
accaagaggg 
ctcctggacc 
gtccagtggc 
ctgcagcgac 
cctatgtcca 
cacgtctgct 
gatgaatatg 
tgcttcaagc 
ctgctggccg 
ttccagacac 
ctgctggtgg 
ctctgccgcc 
cgttctttcc 
tactgggtcc 
gtcattgtgg 
gatgacccca 
aacaccagcc 
gagctgccca 
acctcatccg 
gtggacctct 
aagtgctaca 
atccagggct 



tcctgggtgg 
tgcaggtgcc 
ccatgcgctt 
tgggctatga 
tcctggcaca 
gtgtggtggc 
tctccctatt 
aggtgcgctt 
tggtgcagct 
cctatggccg 
tcgccttcca 
gccagcgcct 
tgttctcgcc 
cgggcgccgt 
cggagctggg 
gcttcagtga 
gccagagcta 
acaccattct 
ctgtggccca 
tggtctaccc 
accaaatctt 
aatgggaccg 
agctgaagaa 
tgtgttccaa 
gcttcgagtg 
aatgccaggc 
ggcagctggt 
ccctgggctt 
ccatagttcg 
catacatggt 
aggccctctt 
agatcgtctg 
gctaccaggg 
taattggcat 
agatcacaat 
tggacctgct 
ccaactacaa 
tctccctctg 
tggtcactgt 
tgatcctctt 
acaccatgag 



cctcttctcc 
catgtgcaag 
cgcggtggag 
gatcgtggat 
cgaggacaac 
tgtcattggc 
tctccttcca 
cccggctttg 
gatgctgcac 
cgacaatggc 
ggagacgctg 
ggtgaccatt 
cgacctgacc 
gtggatcgcc 
ccacttgggc 
gttccgcgag 
tacctgcaac 
caggctctct 
tgccctgcac 
ctggcagctg 
cttcgacccg 
gagccagaat 
catccaagac 
gaggtgccag 
catcgactgc 
ctgcccgaat 
cttcctggaa 
cctcagcacc 
ctcggctggg 
ggtcccggtg 
tcccctctgc 
cgccttcaag 
gccctacgtc 
gctggccacg 
tgtctcctgt 
gctctcagtg 
cgaggccaag 
caccttcatg 
gctcaacctc 
ctacccggag 
gagggactag 



120 

180 

240 

300 

360 

420 

480 

540 

600 

660 

720 

780 

840 

900 

960 

1020 

1080 

1140 

1200 

1260 

1320 

1380 

1440 

1500 

1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 



<210> 24 
<211> 6 
<212> PRT 

<213> Artificial Sequence 
<220> 

<223> Description of Artificial Sequence: Six-His tag 



<400> 24 

His His His His His His 
1 5 



